
# checking L2 home val against total
# Keep rows with in_l2 == 1, in_cl == 1, a positive total, a non-missing
# home_val and multiple == 0; only home_val and total are carried forward.
# NOTE(review): open_dataset()/collect() are presumably arrow's lazy-dataset
# API, so the filter/select would run before the data is pulled into memory;
# confirm against the packages loaded earlier in the file.
out = open_dataset('data/final_long/cycle=2020/') %>%
  filter(in_l2 == 1, in_cl == 1, total > 0, !is.na(home_val), multiple == 0) %>%
  select(home_val, total) %>%
  collect() %>%
  as.data.table()

# Random subsample of up to 5e5 rows, drawn without replacement.
# The size is capped at nrow(out): asking for more rows than exist makes
# sample() error, and 1:nrow(out) degenerates to c(1, 0) on an empty table.
# With at least 5e5 rows this draws the same indices as sample(1:nrow(out), 5e5).
# No seed is set in this section, so the draw depends on the current RNG state.
samp = out[sample.int(nrow(out), min(nrow(out), 5e5))]

# save(samp, file = 'summary_data/figA2.rda') ## re-identifiability
